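# Reference build command (kept commented out): invokes ccec to compile and link
# LLMsGEMM_batch_QKTV_main.cpp into LLMsGEMM_batch_QKTV. ASCEND_HOME_PATH must be set.
# ccec -O2 -std=c++17 -xcce --cce-aicore-arch=dav-c220 \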
#     -I$ASCEND_HOME_PATH/compiler/tikcpp \
#     -I$ASCEND_HOME_PATH/compiler/tikcpp/tikcfw \
#     -I$ASCEND_HOME_PATH/compiler/tikcpp/tikcfw/impl \
#     -I$ASCEND_HOME_PATH/compiler/tikcpp/tikcfw/interface \
#     -I$ASCEND_HOME_PATH/include \
#     -I../../include -I../ \
#     -mllvm -cce-aicore-stack-size=0x8000 \
#     -mllvm -cce-aicore-function-stack-size=0x8000 \
#     -mllvm -cce-aicore-record-overflow=true \
#     -mllvm -cce-aicore-addr-transform \
#     -mllvm -cce-aicore-dcci-insert-for-scalar=false \
#     -L$ASCEND_HOME_PATH/lib64 \
#     -lruntime -lstdc++ -lascendcl -ltiling_api -lregister -lplatform -lascendalog -ldl \
#     -lascendc_runtime -lerror_manager -lprofapi -lge_common_base -lmmpa -lascend_dump -lc_sec \
#     -L$ASCEND_HOME_PATH/tools/simulator/Ascend910B3/lib \
#     -lnpu_drv -lnpu_drv_camodel -lstars -lffts -lruntime_camodel \
#     -lpem_davinci -lmodel_top -lmcu_wrapper -lmcu_loop \
#     LLMsGEMM_batch_QKTV_main.cpp -o LLMsGEMM_batch_QKTV